from transformers import AutoModel,AutoTokenizer
# Directory that holds the pretrained checkpoint; both the tokenizer and the
# model are loaded from this single location.
model_path = "/home/"

# NOTE: trust_remote_code=True lets transformers execute custom Python code
# shipped with the checkpoint, so model_path must point at a trusted source.
tokenizer = AutoTokenizer.from_pretrained(model_path, trust_remote_code=True)

model = AutoModel.from_pretrained(model_path, trust_remote_code=True)
# quantize() is not part of the generic AutoModel API; presumably it comes
# from the checkpoint's custom model code and applies 4-bit quantization
# -- TODO confirm against the model's documentation.
model = model.quantize(4)
# Presumably a torch module: eval() would switch it to inference mode.
model.eval()

# Run a single chat turn with an empty conversation history. The call returns
# a pair, unpacked here into the reply and the updated history.
response, history = model.chat(tokenizer, "晚上", history=[])


